package de.placidi.pressreview.parsing;

import java.io.IOException;
import java.util.List;

/**
 * Public entry point for parsing HTML sites.
 * <p>
 * According to the original author's note, parsing relies on the Jsoup
 * library; this interface itself does not reference it.
 *
 * @author Alexander Placidi
 */
public interface HTMLParser {

	/**
	 * Collects the texts found on the given website. To reduce complexity,
	 * only headlines are gathered.
	 *
	 * @param url
	 *            address of the website to scan
	 * @param filter
	 *            restriction that keeps the scanner from leaving the site of
	 *            interest
	 * @param depth
	 *            how deep the scanner searches
	 * @return the list of texts that were found
	 * @throws IOException
	 *             presumably when the site cannot be fetched or read; the
	 *             exact conditions depend on the implementation
	 */
	List<String> getAllTexts(String url, String filter, int depth) throws IOException;

}
